Add a new notification hold-off interface to the shared ring macros (ring.h). Move the net and blk split drivers to use it.
blktap probably needs some work. :-)
Signed-off-by: Keir Fraser <keir@xensource.com>
blkif_response_t *resp;
unsigned long flags;
blkif_back_ring_t *blk_ring = &blkif->blk_ring;
+ int notify;
/* Place on the response ring for the relevant domain. */
spin_lock_irqsave(&blkif->blk_ring_lock, flags);
resp->id = id;
resp->operation = op;
resp->status = st;
- wmb(); /* Ensure other side can see the response fields. */
blk_ring->rsp_prod_pvt++;
- RING_PUSH_RESPONSES(blk_ring);
+ RING_PUSH_RESPONSES_AND_CHECK_NOTIFY(blk_ring, notify);
spin_unlock_irqrestore(&blkif->blk_ring_lock, flags);
- /* Kick the relevant domain. */
- notify_remote_via_irq(blkif->irq);
+ /*
+ * Tail check for pending requests. Allows the frontend to avoid
+ * notifications if requests are already in flight (lowers overhead
+ * and promotes batching).
+ */
+ if (!__on_blkdev_list(blkif) &&
+ RING_HAS_UNCONSUMED_REQUESTS(blk_ring)) {
+ add_to_blkdev_list_tail(blkif);
+ maybe_trigger_blkio_schedule();
+ }
+
+ if (notify)
+ notify_remote_via_irq(blkif->irq);
}
void blkif_deschedule(blkif_t *blkif)
static inline void flush_requests(struct blkfront_info *info)
{
+ RING_IDX old_prod = info->ring.sring->req_prod;
+
RING_PUSH_REQUESTS(&info->ring);
- notify_remote_via_irq(info->irq);
+
+ /*
+ * Send new requests /then/ check if any old requests are still in
+ * flight. If so, there is no need to send a notification.
+ */
+ mb();
+ if (info->ring.sring->rsp_prod == old_prod)
+ notify_remote_via_irq(info->irq);
}
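
A concrete trace of the rule above (indices illustrative): suppose req_prod was 10 on entry to flush_requests() and two new requests were pushed, so req_prod is now 12. If rsp_prod has reached 10, every earlier request has been answered and the backend may have gone idle, so we notify. If rsp_prod is still 8, the backend is active and its tail check in make_response() will pick up the new requests without an interrupt.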
static void kick_pending_request_queues(struct blkfront_info *info)
return IRQ_HANDLED;
}
+ again:
rp = info->ring.sring->rsp_prod;
rmb(); /* Ensure we see queued responses up to 'rp'. */
info->ring.rsp_cons = i;
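+ /*
+ * If requests are still outstanding, re-check for responses (arming
+ * rsp_event) race-free via the FINAL_CHECK macro; otherwise simply
+ * arm rsp_event for whichever response arrives next.
+ */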
+ if (i != info->ring.req_prod_pvt) {
+ int more_to_do;
+ RING_FINAL_CHECK_FOR_RESPONSES(&info->ring, more_to_do);
+ if (more_to_do)
+ goto again;
+ } else {
+ info->ring.sring->rsp_event = i + 1;
+ }
+
kick_pending_request_queues(info);
spin_unlock_irqrestore(&blkif_io_lock, flags);
kfree(copy);
- /* info->ring->req_prod will be set when we flush_requests().*/
- wmb();
-
/* Kicks things back into life. */
flush_requests(info);
static unsigned int blktap_poll(struct file *file, poll_table *wait)
{
poll_wait(file, &blktap_wait, wait);
- if (RING_HAS_UNPUSHED_REQUESTS(&blktap_ufe_ring)) {
+ if (blktap_ufe_ring.req_prod_pvt != blktap_ufe_ring.sring->req_prod) {
flush_tlb_all();
RING_PUSH_REQUESTS(&blktap_ufe_ring);
return POLLIN | POLLRDNORM;
static gnttab_transfer_t grant_rx_op[MAX_PENDING_REQS];
static unsigned char rx_notify[NR_IRQS];
-/* Don't currently gate addition of an interface to the tx scheduling list. */
-#define tx_work_exists(_if) (1)
-
static unsigned long mmap_vstart;
#define MMAP_VADDR(_req) (mmap_vstart + ((_req) * PAGE_SIZE))
* aggressive in avoiding new-packet notifications -- frontend only needs to
* send a notification if there are no outstanding unreceived responses.
* If we may be buffering transmit buffers for any reason then we must be rather
- * more conservative and advertise that we are 'sleeping' this connection here.
+ * more conservative and treat this as the final check for pending work.
*/
void netif_schedule_work(netif_t *netif)
{
- if (RING_HAS_UNCONSUMED_REQUESTS(&netif->tx)) {
+ int more_to_do;
+
+#ifdef CONFIG_XEN_NETDEV_PIPELINED_TRANSMITTER
+ more_to_do = RING_HAS_UNCONSUMED_REQUESTS(&netif->tx);
+#else
+ RING_FINAL_CHECK_FOR_REQUESTS(&netif->tx, more_to_do);
+#endif
+
+ if (more_to_do) {
add_to_net_schedule_list_tail(netif);
maybe_schedule_tx_action();
}
-#ifndef CONFIG_XEN_NETDEV_PIPELINED_TRANSMITTER
- else {
- netif->tx.sring->server_is_sleeping = 1;
- mb();
- if (RING_HAS_UNCONSUMED_REQUESTS(&netif->tx)) {
- netif->tx.sring->server_is_sleeping = 0;
- add_to_net_schedule_list_tail(netif);
- maybe_schedule_tx_action();
- }
- }
-#endif
}
void netif_deschedule_work(netif_t *netif)
pending_ring[MASK_PEND_IDX(pending_prod++)] = pending_idx;
- /*
- * Scheduling checks must happen after the above response is
- * posted. This avoids a possible race with a guest OS on
- * another CPU if that guest is testing against 'resp_prod'
- * when deciding whether to notify us when it queues additional
- * packets.
- */
- mb();
-
- if (RING_HAS_UNCONSUMED_REQUESTS(&netif->tx)) {
- add_to_net_schedule_list_tail(netif);
- } else {
- netif->tx.sring->server_is_sleeping = 1;
- mb();
- if (RING_HAS_UNCONSUMED_REQUESTS(&netif->tx)) {
- netif->tx.sring->server_is_sleeping = 0;
- add_to_net_schedule_list_tail(netif);
- }
- }
-
netif_put(netif);
}
}
RING_IDX i;
gnttab_map_grant_ref_t *mop;
unsigned int data_len;
- int ret;
+ int ret, work_to_do;
if (dealloc_cons != dealloc_prod)
net_tx_action_dealloc();
netif_get(netif);
remove_from_net_schedule_list(netif);
- /* Work to do? */
- if (!RING_HAS_UNCONSUMED_REQUESTS(&netif->tx)) {
+ RING_FINAL_CHECK_FOR_REQUESTS(&netif->tx, work_to_do);
+ if (!work_to_do) {
netif_put(netif);
continue;
}
irqreturn_t netif_be_int(int irq, void *dev_id, struct pt_regs *regs)
{
netif_t *netif = dev_id;
- if (tx_work_exists(netif)) {
- add_to_net_schedule_list_tail(netif);
- maybe_schedule_tx_action();
- }
+ add_to_net_schedule_list_tail(netif);
+ maybe_schedule_tx_action();
return IRQ_HANDLED;
}
{
RING_IDX i = netif->tx.rsp_prod_pvt;
netif_tx_response_t *resp;
+ int notify;
resp = RING_GET_RESPONSE(&netif->tx, i);
resp->id = id;
resp->status = st;
- wmb();
- netif->tx.rsp_prod_pvt = ++i;
- RING_PUSH_RESPONSES(&netif->tx);
- mb(); /* Update producer before checking event threshold. */
- if (i == netif->tx.sring->rsp_event)
+ netif->tx.rsp_prod_pvt = ++i;
+ RING_PUSH_RESPONSES_AND_CHECK_NOTIFY(&netif->tx, notify);
+ if (notify)
notify_remote_via_irq(netif->irq);
+
+#ifdef CONFIG_XEN_NETDEV_PIPELINED_TRANSMITTER
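+ /* Every consumed request now has a response; final check before idling. */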
+ if (i == netif->tx.req_cons) {
+ int more_to_do;
+ RING_FINAL_CHECK_FOR_REQUESTS(&netif->tx, more_to_do);
+ if (more_to_do)
+ add_to_net_schedule_list_tail(netif);
+ }
+#endif
}
static int make_rx_response(netif_t *netif,
{
RING_IDX i = netif->rx.rsp_prod_pvt;
netif_rx_response_t *resp;
+ int notify;
resp = RING_GET_RESPONSE(&netif->rx, i);
resp->offset = offset;
resp->status = (s16)size;
if (st < 0)
resp->status = (s16)st;
- wmb();
+
netif->rx.rsp_prod_pvt = ++i;
- RING_PUSH_RESPONSES(&netif->rx);
+ RING_PUSH_RESPONSES_AND_CHECK_NOTIFY(&netif->rx, notify);
- mb(); /* Update producer before checking event threshold. */
- return (i == netif->rx.sring->rsp_event);
+ return notify;
}
static irqreturn_t netif_be_dbg(int irq, void *dev_id, struct pt_regs *regs)
RING_IDX i;
grant_ref_t ref;
unsigned long mfn;
+ int notify;
if (unlikely(np->tx_full)) {
printk(KERN_ALERT "%s: full queue wasn't stopped!\n",
tx->size = skb->len;
tx->csum_blank = (skb->ip_summed == CHECKSUM_HW);
- wmb(); /* Ensure that backend will see the request. */
np->tx.req_prod_pvt = i + 1;
- RING_PUSH_REQUESTS(&np->tx);
+ RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&np->tx, notify);
+ if (notify)
+ notify_remote_via_irq(np->irq);
network_tx_buf_gc(dev);
np->stats.tx_bytes += skb->len;
np->stats.tx_packets++;
- /* Only notify Xen if we really have to. */
- mb();
- if (np->tx.sring->server_is_sleeping) {
- np->tx.sring->server_is_sleeping = 0;
- notify_remote_via_irq(np->irq);
- }
-
return 0;
drop:
rx->id, rx->status);
RING_GET_REQUEST(&np->rx, np->rx.req_prod_pvt)->id =
rx->id;
- wmb();
+ RING_GET_REQUEST(&np->rx, np->rx.req_prod_pvt)->gref =
+ ref;
np->rx.req_prod_pvt++;
RING_PUSH_REQUESTS(&np->rx);
work_done--;
if (work_done < budget) {
local_irq_save(flags);
- np->rx.sring->rsp_event = i + 1;
-
- /* Deal with hypervisor racing our resetting of rx_event. */
- mb();
- if (np->rx.sring->rsp_prod == i) {
+ RING_FINAL_CHECK_FOR_RESPONSES(&np->rx, more_to_do);
+ if (!more_to_do)
__netif_rx_complete(dev);
- more_to_do = 0;
- }
local_irq_restore(flags);
}
/* Step 1: Reinitialise variables. */
np->tx_full = 0;
- np->rx.sring->rsp_event = np->tx.sring->rsp_event = 1;
/*
* Step 2: Rebuild the RX and TX ring contents.
np->stats.tx_bytes += skb->len;
np->stats.tx_packets++;
}
- wmb();
+
np->tx.req_prod_pvt = requeue_idx;
RING_PUSH_REQUESTS(&np->tx);
RING_GET_REQUEST(&np->rx, requeue_idx)->id = i;
requeue_idx++;
}
- wmb();
+
np->rx.req_prod_pvt = requeue_idx;
RING_PUSH_REQUESTS(&np->rx);
* packets.
*/
np->backend_state = BEST_CONNECTED;
- wmb();
notify_remote_via_irq(np->irq);
network_tx_buf_gc(dev);
#include "ring.h"
+/*
+ * Front->back notifications: When enqueuing a new request, there is no
+ * need to send a notification if there are old requests still in flight
+ * (that is, old_req_prod != sring->rsp_prod). The backend guarantees to check
+ * for new requests after queuing the response for the last in-flight request.
+ * (NB. The generic req_event mechanism is not used for blk requests.)
+ *
+ * Back->front notifications: When enqueuing a new response, sending a
+ * notification can be made conditional on rsp_event (i.e., the generic
+ * hold-off mechanism provided by the ring macros). Frontends must set
+ * rsp_event appropriately (e.g., using RING_FINAL_CHECK_FOR_RESPONSES()).
+ */
+
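
As an illustration of the two rules above, a minimal sketch of both halves of the blk protocol, condensed from the blkfront/blkback hunks earlier in this patch (front_flush, back_respond and reschedule_this_connection are illustrative names; locking and error handling are elided):

    /* Front: push new requests; notify only if no old requests in flight. */
    static void front_flush(blkif_front_ring_t *ring, int irq)
    {
        RING_IDX old_prod = ring->sring->req_prod;
        RING_PUSH_REQUESTS(ring);
        mb(); /* push requests /then/ sample rsp_prod */
        if (ring->sring->rsp_prod == old_prod)
            notify_remote_via_irq(irq);
    }

    /* Back: queue a response, then re-check for requests before idling. */
    static void back_respond(blkif_back_ring_t *ring, int irq)
    {
        int notify;
        /* ... fill in RING_GET_RESPONSE(ring, ring->rsp_prod_pvt) ... */
        ring->rsp_prod_pvt++;
        RING_PUSH_RESPONSES_AND_CHECK_NOTIFY(ring, notify);
        if (RING_HAS_UNCONSUMED_REQUESTS(ring))
            reschedule_this_connection();
        if (notify)
            notify_remote_via_irq(irq);
    }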
#ifndef blkif_vdev_t
#define blkif_vdev_t uint16_t
#endif
#include "ring.h"
+/*
+ * Note that there is *never* any need to notify the backend when enqueuing
+ * receive requests (netif_rx_request_t). Notifications after enqueuing any
+ * other type of message should be conditional on the appropriate req_event
+ * or rsp_event field in the shared ring.
+ */
+
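
A minimal sketch of the distinction drawn above, condensed from the netfront hunks in this patch (np is the usual netfront private structure):

    /* RX: requeue a receive buffer -- a push alone is always sufficient. */
    np->rx.req_prod_pvt++;
    RING_PUSH_REQUESTS(&np->rx);

    /* TX: push a transmit request; notify only if req_event was crossed. */
    np->tx.req_prod_pvt++;
    RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&np->tx, notify);
    if (notify)
        notify_remote_via_irq(np->irq);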
typedef struct netif_tx_request {
grant_ref_t gref; /* Reference to buffer page */
uint16_t offset:15; /* Offset within buffer page */
-
-
-
-/*
+/******************************************************************************
+ * ring.h
+ *
* Shared producer-consumer ring macros.
+ *
* Tim Deegan and Andrew Warfield November 2004.
- */
+ */
#ifndef __XEN_PUBLIC_IO_RING_H__
#define __XEN_PUBLIC_IO_RING_H__
(__RD32(((_sz) - (long)&(_s)->ring + (long)(_s)) / sizeof((_s)->ring[0])))
/*
- * Macros to make the correct C datatypes for a new kind of ring.
+ * Macros to make the correct C datatypes for a new kind of ring.
*
- * To make a new ring datatype, you need to have two message structures,
- * let's say request_t, and response_t already defined.
+ * To make a new ring datatype, you need to have two message structures,
+ * let's say request_t and response_t, already defined.
*
- * In a header where you want the ring datatype declared, you then do:
+ * In a header where you want the ring datatype declared, you then do:
*
* DEFINE_RING_TYPES(mytag, request_t, response_t);
*
- * These expand out to give you a set of types, as you can see below.
- * The most important of these are:
+ * These expand out to give you a set of types, as you can see below.
+ * The most important of these are:
*
* mytag_sring_t - The shared ring.
* mytag_front_ring_t - The 'front' half of the ring.
* mytag_back_ring_t - The 'back' half of the ring.
*
- * To initialize a ring in your code you need to know the location and size
- * of the shared memory area (PAGE_SIZE, for instance). To initialise
- * the front half:
+ * To initialize a ring in your code you need to know the location and size
+ * of the shared memory area (PAGE_SIZE, for instance). To initialise
+ * the front half:
*
- * mytag_front_ring_t front_ring;
+ * mytag_front_ring_t front_ring;
+ * SHARED_RING_INIT((mytag_sring_t *)shared_page);
+ * FRONT_RING_INIT(&front_ring, (mytag_sring_t *)shared_page, PAGE_SIZE);
*
- * SHARED_RING_INIT((mytag_sring_t *)shared_page);
- * FRONT_RING_INIT(&front_ring, (mytag_sring_t *)shared_page, PAGE_SIZE);
+ * Initializing the back follows similarly (note that only the front
+ * initializes the shared ring):
*
- * Initializing the back follows similarly...
+ * mytag_back_ring_t back_ring;
+ * BACK_RING_INIT(&back_ring, (mytag_sring_t *)shared_page, PAGE_SIZE);
*/
#define DEFINE_RING_TYPES(__name, __req_t, __rsp_t) \
\
/* Shared ring page */ \
struct __name##_sring { \
- RING_IDX req_prod; \
- RING_IDX rsp_prod; \
- RING_IDX rsp_event; /* notify client when rsp_prod == rsp_event */ \
- uint8_t server_is_sleeping; /* notify server to kick off work */ \
+ RING_IDX req_prod, req_event; \
+ RING_IDX rsp_prod, rsp_event; \
union __name##_sring_entry ring[1]; /* variable-length */ \
}; \
\
typedef struct __name##_back_ring __name##_back_ring_t
/*
- * Macros for manipulating rings.
+ * Macros for manipulating rings.
*
- * FRONT_RING_whatever works on the "front end" of a ring: here
- * requests are pushed on to the ring and responses taken off it.
+ * FRONT_RING_whatever works on the "front end" of a ring: here
+ * requests are pushed on to the ring and responses taken off it.
*
- * BACK_RING_whatever works on the "back end" of a ring: here
- * requests are taken off the ring and responses put on.
+ * BACK_RING_whatever works on the "back end" of a ring: here
+ * requests are taken off the ring and responses put on.
*
- * N.B. these macros do NO INTERLOCKS OR FLOW CONTROL.
- * This is OK in 1-for-1 request-response situations where the
- * requestor (front end) never has more than RING_SIZE()-1
- * outstanding requests.
+ * N.B. these macros do NO INTERLOCKS OR FLOW CONTROL.
+ * This is OK in 1-for-1 request-response situations where the
+ * requestor (front end) never has more than RING_SIZE()-1
+ * outstanding requests.
*/
/* Initialising empty rings */
#define SHARED_RING_INIT(_s) do { \
- (_s)->req_prod = 0; \
- (_s)->rsp_prod = 0; \
+ (_s)->req_prod = (_s)->rsp_prod = 0; \
+ (_s)->req_event = (_s)->rsp_event = 1; \
} while(0)
#define FRONT_RING_INIT(_r, _s, __size) do { \
#define RING_SIZE(_r) \
((_r)->nr_ents)
-/* How many empty slots are on a ring? */
-#define RING_PENDING_REQUESTS(_r) \
- ( ((_r)->req_prod_pvt - (_r)->rsp_cons) )
-
/* Test if there is an empty slot available on the front ring.
* (This is only meaningful from the front.)
*/
(((_r)->req_cons - (_r)->rsp_prod_pvt) != \
RING_SIZE(_r)) )
-/* Test if there are messages waiting to be pushed. */
-#define RING_HAS_UNPUSHED_REQUESTS(_r) \
- ( (_r)->req_prod_pvt != (_r)->sring->req_prod )
-
-#define RING_HAS_UNPUSHED_RESPONSES(_r) \
- ( (_r)->rsp_prod_pvt != (_r)->sring->rsp_prod )
-
-/* Copy the private producer pointer into the shared ring so the other end
- * can see the updates we've made. */
-#define RING_PUSH_REQUESTS(_r) do { \
- wmb(); \
- (_r)->sring->req_prod = (_r)->req_prod_pvt; \
-} while (0)
-
-#define RING_PUSH_RESPONSES(_r) do { \
- wmb(); \
- (_r)->sring->rsp_prod = (_r)->rsp_prod_pvt; \
-} while (0)
-
/* Direct access to individual ring elements, by index. */
#define RING_GET_REQUEST(_r, _idx) \
(&((_r)->sring->ring[ \
#define RING_REQUEST_CONS_OVERFLOW(_r, _cons) \
(((_cons) - (_r)->rsp_prod_pvt) >= RING_SIZE(_r))
+#define RING_PUSH_REQUESTS(_r) do { \
+ wmb(); /* back sees requests /before/ updated producer index */ \
+ (_r)->sring->req_prod = (_r)->req_prod_pvt; \
+} while (0)
+
+#define RING_PUSH_RESPONSES(_r) do { \
+ wmb(); /* front sees responses /before/ updated producer index */ \
+ (_r)->sring->rsp_prod = (_r)->rsp_prod_pvt; \
+} while (0)
+
+/*
+ * Notification hold-off (req_event and rsp_event):
+ *
+ * When queueing requests or responses on a shared ring, it may not always be
+ * necessary to notify the remote end. For example, if requests are in flight
+ * in a backend, the front may be able to queue further requests without
+ * notifying the back (if the back checks for new requests when it queues
+ * responses).
+ *
+ * When enqueuing requests or responses:
+ *
+ * Use RING_PUSH_{REQUESTS,RESPONSES}_AND_CHECK_NOTIFY(). The second argument
+ * is a boolean return value. True indicates that the receiver requires an
+ * asynchronous notification.
+ *
+ * After dequeuing requests or responses (before putting a connection to sleep):
+ *
+ * Use RING_FINAL_CHECK_FOR_REQUESTS() or RING_FINAL_CHECK_FOR_RESPONSES().
+ * The second argument is a boolean return value. True indicates that there
+ * are pending messages on the ring (i.e., the connection should not be put
+ * to sleep).
+ *
+ * These macros will set the req_event/rsp_event field to trigger a
+ * notification on the very next message that is enqueued. If you want to
+ * create batches of work (i.e., only receive a notification after several
+ * messages have been enqueued) then you will need to create a customised
+ * version of the FINAL_CHECK macro in your own code, which sets the event
+ * field appropriately.
+ */
+
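+/*
+ * The _notify tests below use unsigned RING_IDX arithmetic, so they are
+ * correct across index wraparound: (__new - event) < (__new - __old) holds
+ * exactly when the event index lies in the half-open window (__old, __new],
+ * i.e., when this push carried the producer past the point at which the
+ * consumer asked to be woken. For example, with __old = 5 and __new = 8,
+ * notification fires iff the event index is 6, 7 or 8.
+ */
+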
+#define RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(_r, _notify) do { \
+ RING_IDX __old = (_r)->sring->req_prod; \
+ RING_IDX __new = (_r)->req_prod_pvt; \
+ wmb(); /* back sees requests /before/ updated producer index */ \
+ (_r)->sring->req_prod = __new; \
+ mb(); /* back sees new requests /before/ we check req_event */ \
+ (_notify) = ((RING_IDX)(__new - (_r)->sring->req_event) < \
+ (RING_IDX)(__new - __old)); \
+} while (0)
+
+#define RING_PUSH_RESPONSES_AND_CHECK_NOTIFY(_r, _notify) do { \
+ RING_IDX __old = (_r)->sring->rsp_prod; \
+ RING_IDX __new = (_r)->rsp_prod_pvt; \
+ wmb(); /* front sees responses /before/ updated producer index */ \
+ (_r)->sring->rsp_prod = __new; \
+ mb(); /* front sees new responses /before/ we check rsp_event */ \
+ (_notify) = ((RING_IDX)(__new - (_r)->sring->rsp_event) < \
+ (RING_IDX)(__new - __old)); \
+} while (0)
+
+#define RING_FINAL_CHECK_FOR_REQUESTS(_r, _work_to_do) do { \
+ (_work_to_do) = RING_HAS_UNCONSUMED_REQUESTS(_r); \
+ if (_work_to_do) break; \
+ (_r)->sring->req_event = (_r)->req_cons + 1; \
+ mb(); \
+ (_work_to_do) = RING_HAS_UNCONSUMED_REQUESTS(_r); \
+} while (0)
+
+#define RING_FINAL_CHECK_FOR_RESPONSES(_r, _work_to_do) do { \
+ (_work_to_do) = RING_HAS_UNCONSUMED_RESPONSES(_r); \
+ if (_work_to_do) break; \
+ (_r)->sring->rsp_event = (_r)->rsp_cons + 1; \
+ mb(); \
+ (_work_to_do) = RING_HAS_UNCONSUMED_RESPONSES(_r); \
+} while (0)
+
#endif /* __XEN_PUBLIC_IO_RING_H__ */
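
To tie the new macros together, a hedged sketch of a backend worker loop using them (request_t as in the DEFINE_RING_TYPES example above; process() and queue_response() are illustrative helpers):

    static void back_worker(mytag_back_ring_t *ring, int irq)
    {
        request_t req;
        int notify, more;

        do {
            while (RING_HAS_UNCONSUMED_REQUESTS(ring)) {
                rmb(); /* read the request body only after seeing req_prod */
                memcpy(&req, RING_GET_REQUEST(ring, ring->req_cons),
                       sizeof(req));
                ring->req_cons++;
                process(&req);
                queue_response(ring, &req); /* fills RING_GET_RESPONSE() */
                ring->rsp_prod_pvt++;
            }
            RING_PUSH_RESPONSES_AND_CHECK_NOTIFY(ring, notify);
            if (notify)
                notify_remote_via_irq(irq);
            /* Arm req_event and re-check before going to sleep. */
            RING_FINAL_CHECK_FOR_REQUESTS(ring, more);
        } while (more);
    }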
/*